<!DOCTYPE html>
<html lang="en">

  <head>

    <meta charset="utf-8">
    <meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
    <!-- Description is a readable sentence; the original topic list is kept as keywords -->
    <meta name="description" content="Excalibur: PDF table extraction for humans. Extract tables from PDFs and download them as CSVs or an Excel spreadsheet.">
    <meta name="keywords" content="Excalibur, PDF, Parsing, Table, Extraction, OCR">
    <!-- One entry per author (first and last name kept together) -->
    <meta name="author" content="Vinayak Mehta, Nikhil Sikka">

    <title>Excalibur | PDF Table Extraction for Humans</title>

    <!-- Bootstrap core CSS (pinned to 4.1.3, verified with Subresource Integrity) -->
    <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/4.1.3/css/bootstrap.min.css" integrity="sha256-eSi1q2PG6J7g7ib17yAaWMcrr5GrtohYChqibrV7PBE=" crossorigin="anonymous">

    <!-- Font Awesome 5.5.0 icon font (verified with Subresource Integrity) -->
    <link rel="stylesheet" href="https://use.fontawesome.com/releases/v5.5.0/css/all.css" integrity="sha384-B4dIYHKNBt8Bc12p+WXckhzcICo0wtJAoU8YZTY5qE0Id1GSseTk6S+L3BlXeVIU" crossorigin="anonymous">

    <!-- Web fonts: Montserrat and Lato -->
    <link href="https://fonts.googleapis.com/css?family=Montserrat:400,700" rel="stylesheet">
    <link href="https://fonts.googleapis.com/css?family=Lato:400,700,400italic,700italic" rel="stylesheet">

    <!-- Custom styles for this template; loaded last so they can override the CDN styles -->
    <link href="css/index.min.css" rel="stylesheet">

  </head>

  <body id="page-top">

    <!-- Navigation -->
    <nav id="mainNav" class="navbar navbar-expand-lg bg-secondary fixed-top text-uppercase">
      <div class="container">
        <!-- Brand link targets the #page-top fragment -->
        <a href="#page-top" class="navbar-brand js-scroll-trigger">Excalibur</a>

        <!-- Collapse toggle for the link list in #navbarResponsive -->
        <button
          type="button"
          class="navbar-toggler navbar-toggler-right text-uppercase bg-primary text-white rounded"
          data-toggle="collapse"
          data-target="#navbarResponsive"
          aria-controls="navbarResponsive"
          aria-expanded="false"
          aria-label="Toggle navigation">
          Menu
          <i class="fas fa-bars"></i>
        </button>

        <!-- In-page section links: About, Usage, Download, Team -->
        <div id="navbarResponsive" class="collapse navbar-collapse">
          <ul class="navbar-nav ml-auto">
            <li class="nav-item mx-0 mx-lg-1">
              <a href="#about" class="nav-link py-3 px-0 px-lg-3 rounded js-scroll-trigger">About</a>
            </li>
            <li class="nav-item mx-0 mx-lg-1">
              <a href="#usage" class="nav-link py-3 px-0 px-lg-3 rounded js-scroll-trigger">Usage</a>
            </li>
            <li class="nav-item mx-0 mx-lg-1">
              <a href="#download" class="nav-link py-3 px-0 px-lg-3 rounded js-scroll-trigger">Download</a>
            </li>
            <li class="nav-item mx-0 mx-lg-1">
              <a href="#team" class="nav-link py-3 px-0 px-lg-3 rounded js-scroll-trigger">Team</a>
            </li>
          </ul>
        </div>
      </div>
    </nav>

    <!-- Header -->
    <header class="masthead bg-primary text-white">
      <div class="container">
        <div class="row">
          <!-- Left column: logo, product name, tagline and GitHub star button -->
          <div class="col-md-6 col-sm-12 col-xs-12 text-center">
            <!-- height="auto" was dropped: the attribute only accepts an integer, and Bootstrap's img-fluid class already sets height: auto in CSS -->
            <img src="https://excalibur-py.readthedocs.io/en/master/_static/excalibur-logo-circle.png" class="rounded-circle img-fluid mb-5 d-block mx-auto"
              width="150" alt="Excalibur">
            <hr class="star-light">
            <h1 class="text-uppercase mb-1 lead">Excalibur</h1>
            <h4 class="mb-4 mt-3">PDF Table Extraction for Humans</h4>
            <a class="github-button" href="https://github.com/camelot-dev/excalibur" data-size="large" data-show-count="true" aria-label="Star camelot-dev/excalibur on GitHub">Star</a>
          </div>
          <!-- Right column: feedback form posted to Formspree -->
          <div class="col-md-4 offset-md-2 offset-sm-0 col-sm-12 col-xs-12 mt-4">
            <div>
              <h4 class="lead">Do you have feedback or want us to build a new feature? Just holler!</h4>
              <hr>
            </div>
            <div class="d-flex align-items-center justify-content-center mt-2">
              <form action="https://formspree.io/vmehta94@gmail.com" method="POST">
                <!-- "for" must reference the input's id ("email"), not its name; the submitted field name "emailID" is unchanged -->
                <label class="text-white" for="email">E-mail</label>
                <input class="form-control form-control-lg mb-3" type="email" name="emailID" id="email" placeholder="example@domain.com">

                <label class="text-white" for="comment">Message</label>
                <textarea class="form-control form-control-lg mb-3" name="comment" id="comment" cols="30" rows="5" placeholder="Give us feedback, tell us about your awesome use case or just say hello!"></textarea>

                <div class="text-right">
                  <button type="submit" value="Send" class="btn btn-lg btn-block btn-accent">Submit</button>
                </div>
              </form>
            </div>
          </div>
        </div>
      </div>
    </header>

    <!-- About Section -->
    <section class="text-secondary mb-0" id="about">
      <div class="container-fluid">
        <h2 class="text-center text-uppercase text-secondary">About</h2>
        <hr class="star-dark mb-5">
      </div>
      <div class="container">
        <!-- Four feature cards. Each icon-only <h3> is purely decorative, so it is hidden from assistive technology instead of being exposed as an empty heading. -->
        <div class="row">
          <div class="col-lg-6">
            <div class="media mt-4">
              <h3 aria-hidden="true"><i class="fa fa-table text-accent mr-3"></i></h3>
              <div class="media-body">
                <h5 class="mb-1 text-accent">Extracting tables from PDFs is hard</h5>
                <p class="lead text-helper">The Portable Document Format (PDF) was not designed for tabular data. Sadly, a lot of open data is shared as PDFs and getting tables out for analysis and record-keeping is a pain. <strong class="font-weight-bold">Excalibur makes PDF table extraction very easy.</strong> You can download the extracted tables as CSVs or an Excel spreadsheet. All data remains on your machine.</p>
              </div>
            </div>
          </div>
          <div class="col-lg-6">
            <div class="media mt-4">
              <h3 aria-hidden="true"><i class="fa fa-wrench text-accent mr-3"></i></h3>
              <div class="media-body">
                <h5 class="mb-1 text-accent">Why another tool?</h5>
                <p class="lead text-helper">There are both open and closed-source tools that are widely used for PDF table extraction. They either give a nice output or fail miserably. Excalibur is powered by <a href="https://camelot-py.readthedocs.io">Camelot</a> (written by one of the authors) which gives users complete control over table extraction. If you don't get the desired output with default settings, you can tweak them and get the job done!</p>
              </div>
            </div>
          </div>
          <div class="col-lg-6">
            <div class="media mt-4">
              <h3 aria-hidden="true"><i class="fa fa-cubes text-accent mr-3"></i></h3>
              <div class="media-body">
                <h5 class="mb-1 text-accent">Automate your workflow</h5>
                <p class="lead text-helper">Excalibur can detect tables in your PDFs automatically. For cases where it doesn't, you can tweak table extraction settings, save them as presets and then apply them on different PDFs with similar table structures. After v0.5.0, Excalibur will have a web API which can be used to start table extraction jobs and download extracted tables when jobs finish.</p>
              </div>
            </div>
          </div>
          <div class="col-lg-6">
            <div class="media mt-4">
              <h3 aria-hidden="true"><i class="fa fa-rocket text-accent mr-3"></i></h3>
              <div class="media-body">
                <h5 class="mb-1 text-accent">Built for scale</h5>
                <!-- rel="noopener" keeps pages opened in a new tab from reaching back through window.opener -->
                <p class="lead text-helper">Excalibur can be configured with MySQL and <a href="http://www.celeryproject.org/" target="_blank" rel="noopener">Celery</a> to execute table extraction jobs in a parallel and distributed manner. By default, jobs are executed sequentially. You can check out the documentation at <a href="https://excalibur-py.readthedocs.io" target="_blank" rel="noopener">https://excalibur-py.readthedocs.io</a> for more details.</p>
              </div>
            </div>
          </div>
        </div>
      </div>
    </section>

    <!-- Usage Section -->
    <section class="bg-primary features" id="usage">
      <div class="container">
        <h2 class="text-center text-uppercase text-white mb-0">Usage</h2>
        <hr class="star-light mb-5">
        <!--
          Five walkthrough rows, each pairing an animated demo with a short explanation.
          The demo images are no longer wrapped in placeholder href="#" links, which had
          no accessible name and jumped to the top of the page when clicked.
          Each row carries one order-lg-first and one order-lg-last column.
        -->
        <div class="row align-items-center mb-5 text-white">
          <div class="col-md-6 order-lg-first">
            <img class="img-fluid rounded mb-3 mb-md-0" src="https://excalibur-py.readthedocs.io/en/master/_static/gifs/upload.gif" alt="Animated demo of uploading a PDF in Excalibur">
          </div>
          <div class="col-md-6 order-lg-last">
            <h3>Upload your PDF</h3>
            <p>You can upload your PDF using the web interface. You can also see previous uploads. All file storage and processing happens on your own local or remote machine, which means that you have complete control over your data.</p>
          </div>
        </div>
        <div class="row align-items-center mb-5 text-white">
          <div class="col-md-6 order-lg-last">
            <img class="img-fluid rounded mb-3 mb-md-0" src="https://excalibur-py.readthedocs.io/en/master/_static/gifs/auto-detect.gif" alt="Animated demo of Excalibur auto-detecting table areas">
          </div>
          <div class="col-md-6 order-lg-first">
            <h3>Auto-detect table areas</h3>
            <p>You don't need to draw table areas and column separators in most cases, because Excalibur can do that automatically.</p>
          </div>
        </div>
        <div class="row align-items-center mb-5 text-white">
          <div class="col-md-6 order-lg-first">
            <img class="img-fluid rounded mb-3 mb-md-0" src="https://excalibur-py.readthedocs.io/en/master/_static/gifs/table-and-column.gif" alt="Animated demo of drawing table areas and column separators in Excalibur">
          </div>
          <!-- Was order-lg-first on both columns; the visual order (image, then text) is unchanged -->
          <div class="col-md-6 order-lg-last">
            <h3>Or draw table areas and/or column separators</h3>
            <p>You can draw table areas and also add column separators in cases where the tables are buried deep inside the text on the page.</p>
          </div>
        </div>
        <div class="row align-items-center mb-5 text-white">
          <div class="col-md-6 order-lg-last">
            <img class="img-fluid rounded mb-3 mb-md-0" src="https://excalibur-py.readthedocs.io/en/master/_static/gifs/saved-rule.gif" alt="Animated demo of loading a saved table extraction rule in Excalibur">
          </div>
          <div class="col-md-6 order-lg-first">
            <h3>Or load a saved table extraction rule</h3>
            <p>Each new table extraction rule (table areas, column separators and other settings) is saved by default. You can load it next time you see a PDF with a similar table structure.</p>
          </div>
        </div>
        <div class="row align-items-center mb-5 text-white">
          <div class="col-md-6 order-lg-first">
            <img class="img-fluid rounded mb-3 mb-md-0" src="https://excalibur-py.readthedocs.io/en/master/_static/gifs/download.gif" alt="Animated demo of downloading extracted tables from Excalibur">
          </div>
          <!-- Was order-lg-first on both columns; the visual order (image, then text) is unchanged -->
          <div class="col-md-6 order-lg-last">
            <h3>Download extracted tables in structured formats</h3>
            <p>You can view the extracted tables and then download them as CSVs or an Excel spreadsheet. Excalibur also supports JSON and HTML.</p>
          </div>
        </div>
      </div>
    </section>

    <!-- Download Section -->
    <section id="download">
      <div class="container-fluid">
        <h2 class="text-center text-uppercase text-secondary">Download</h2>
        <hr class="star-dark mb-5">
      </div>
      <div class="container">
        <div class="row">
          <div class="col-md-12 text-center mt-4">
            <h5 class="mb-1 text-accent">Available for Windows, macOS and Linux</h5>
            <p class="lead text-helper">Excalibur can be easily installed using <a href="https://en.wikipedia.org/wiki/Pip_(package_manager)">pip</a> which is a package manager for Python packages.</p>
            <div class="text-center">
              <!-- The image is the link's only content, so its alt text names the destination -->
              <a href="https://pypi.org/project/excalibur-py/" target="_blank" rel="noopener">
                <!-- width must be a whole number of pixels (was 234.33) -->
                <img src="pip-excalibur.png" class="rounded mb-2" width="234" alt="Excalibur on PyPI">
              </a>
            </div>
            <p class="lead text-helper">Or you can just download the executable and run it directly!</p>
            <a class="btn btn-xl btn-accent" href="https://github.com/camelot-dev/excalibur/releases" target="_blank" rel="noopener">
              <!-- Decorative icon: the visible link text already carries the meaning -->
              <i class="fas fa-download mr-2" aria-hidden="true"></i>
              Download Now!
            </a>
          </div>
        </div>
      </div>
    </section>

    <!-- Team Section -->
    <section class="bg-grey" id="team">
      <div class="container">
        <h2 class="text-center text-uppercase text-secondary mb-0">Team</h2>
        <hr class="star-grey mb-5">
        <!-- One card per team member. The social links are icon-only, so each gets an aria-label as its accessible name and the icon itself is hidden from assistive technology. -->
        <div class="row">

          <div class="col-lg-6 col-sm-6 col-xs-12 text-center mb-4">
            <img class="rounded-circle img-fluid d-block mx-auto" height="125" width="125"
                  src="https://avatars1.githubusercontent.com/u/4329421?s=460&v=4" alt="Vinayak Mehta">
            <h3 class="mb-1 mt-4">Vinayak Mehta</h3>
            <ul class="list-inline social-icons">
              <li class="list-inline-item">
                <a href="https://www.vinayakmehta.com/about/" target="_blank" rel="noopener" aria-label="Vinayak Mehta's website">
                  <i class="fas fa-globe-asia fa-lg" aria-hidden="true"></i>
                </a>
              </li>
              <li class="list-inline-item">
                <a href="https://github.com/vinayak-mehta" target="_blank" rel="noopener" aria-label="Vinayak Mehta on GitHub">
                  <i class="fab fa-fw fa-github fa-lg" aria-hidden="true"></i>
                </a>
              </li>
              <li class="list-inline-item">
                <a href="https://www.linkedin.com/in/mehtavinayak/" target="_blank" rel="noopener" aria-label="Vinayak Mehta on LinkedIn">
                  <i class="fab fa-fw fa-linkedin fa-lg" aria-hidden="true"></i>
                </a>
              </li>
            </ul>
          </div>

          <div class="col-lg-6 col-sm-6 col-xs-12 text-center mb-4">
            <!-- NOTE(review): the e=1546473600 query parameter looks like an expiry timestamp (early January 2019); confirm this image still loads, or host a copy alongside the site -->
            <img class="rounded-circle img-fluid d-block mx-auto" height="125" width="125"
                  src="https://media.licdn.com/dms/image/C4E03AQHxyta3vScPzA/profile-displayphoto-shrink_800_800/0?e=1546473600&v=beta&t=zMqdJEBtF-jkpfHGykbVCVRFhxXDsvxpPwhVrTJ3kHU" alt="Nikhil Sikka">
            <h3 class="mb-1 mt-4">Nikhil Sikka</h3>
            <ul class="list-inline social-icons">
              <li class="list-inline-item">
                <a href="https://github.com/n-sikka" target="_blank" rel="noopener" aria-label="Nikhil Sikka on GitHub">
                  <i class="fab fa-fw fa-github fa-lg" aria-hidden="true"></i>
                </a>
              </li>
              <li class="list-inline-item">
                <a href="https://www.linkedin.com/in/nikhilsikka/" target="_blank" rel="noopener" aria-label="Nikhil Sikka on LinkedIn">
                  <i class="fab fa-fw fa-linkedin fa-lg" aria-hidden="true"></i>
                </a>
              </li>
            </ul>
          </div>

        </div>
      </div>
    </section>

    <!-- Footer -->
    <footer class="footer text-center">
      <div class="container">
        <div class="row">
          <div class="col-md-12">
            <ul class="list-inline mb-0">
              <li class="list-inline-item">
                <!-- Icon-only link: aria-label supplies the accessible name -->
                <a class="btn btn-outline-light btn-social text-center rounded-circle" href="https://github.com/camelot-dev/excalibur" target="_blank" rel="noopener" aria-label="Excalibur on GitHub">
                  <i class="fab fa-fw fa-github" aria-hidden="true"></i>
                </a>
              </li>
            </ul>
            <!-- Text link to the same repository as the icon above -->
            <a class="mt-2 d-inline-block text-white" href="https://github.com/camelot-dev/excalibur" target="_blank" rel="noopener">View on GitHub</a>
          </div>
        </div>
      </div>
    </footer>

    <!-- Copyright bar. <small> may not contain <p>, so the fine-print size now comes from Bootstrap's .small class on each paragraph. -->
    <div class="copyright py-4 text-center text-white">
      <div class="container">
        <p class="small mb-2">Copyright <a href="https://github.com/camelot-dev/" target="_blank" rel="noopener">&copy; Camelot Dev</a> 2018</p>
        <!-- The heart icon is decorative; the sr-only text keeps the sentence complete for screen readers -->
        <p class="small">Made with <i class="fa fa-heart mx-1" aria-hidden="true"></i><span class="sr-only">love</span> in New Delhi, India</p>
      </div>
    </div>

    <!-- Scroll to Top Button (Only visible on small and extra-small screen sizes) -->
    <div class="scroll-to-top d-lg-none position-fixed">
      <!-- Icon-only link back to #page-top: aria-label supplies the accessible name -->
      <a class="js-scroll-trigger d-block text-center text-white rounded" href="#page-top" aria-label="Scroll to top">
        <i class="fa fa-chevron-up" aria-hidden="true"></i>
      </a>
    </div>

    <!-- Bootstrap core JavaScript: jQuery is loaded first, then the Bootstrap bundle. -->
    <!-- NOTE(review): unlike the CDN stylesheets in the head, these CDN scripts carry no integrity/crossorigin attributes; consider adding SRI hashes. -->
    <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.min.js"></script>
    <script src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/4.1.3/js/bootstrap.bundle.min.js"></script>

    <!-- Plugin JavaScript: jQuery Easing, loaded after jQuery -->
    <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery-easing/1.4.1/jquery.easing.min.js"></script>

    <!-- GitHub buttons script, loaded async/defer so it does not block parsing; presumably renders the .github-button link in the header (confirm) -->
    <script async defer src="https://buttons.github.io/buttons.js"></script>

    <!-- Custom scripts for this template; kept last, after the libraries above -->
    <script src="js/main.min.js"></script>

  </body>

</html>
